% Web reference for the ROSE compiler.
@misc{ROSE,
  title = {The {ROSE} Compiler},
  note  = {http://www.rosecompiler.org/}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{EuroPar2011,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{PER2011,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{CJ2011,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{OP2-User,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{InPar2012,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}

% Liszt mesh-based PDE solver DSL paper (SC '11).
@inproceedings{liszt,
  author    = {DeVito, Zachary and Joubert, Niels and Palacios, Francisco and Oakley, Stephen and Medina, Montserrat and Barrientos, Mike and Elsen, Erich and Ham, Frank and Aiken, Alex and Duraisamy, Karthik and Darve, Eric and Alonso, Juan and Hanrahan, Pat},
  title     = {Liszt: a domain specific language for building portable mesh-based {PDE} solvers},
  booktitle = {Proceedings of 2011 International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '11},
  location  = {Seattle, Washington},
  pages     = {9:1--9:12},
  articleno = {9},
  numpages  = {12},
  year      = {2011},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-0771-0},
  doi       = {10.1145/2063384.2063396},
  url       = {http://doi.acm.org/10.1145/2063384.2063396},
  acmid     = {2063396},
  keywords  = {compiler analysis and program transformations, programming and runtime environments for high performance and high throughput computing}
}


% Web reference for the Scala language.
% Whole words are braced so sentence-casing styles keep the capitals.
@misc{scala,
  title = {The {Scala} {Programming} {Language}},
  note  = {\url{http://www.scala-lang.org/}}
}

% Web reference for the OpenACC standard.
% Whole words are braced so sentence-casing styles keep the capitals.
@misc{openacc,
  title = {{OpenACC}: {Directives} {For} {Accelerators}},
  note  = {\url{http://www.openacc-standard.org/}}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{CF2012,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{oplus_a,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}

% Placeholder entry: details withheld for double-blind review.
@inproceedings{oplus_b,
  author = {},
  title  = {deleted for double-blind review},
  series = {},
  year   = {}
}



% SBLOCK stencil-based PDE solver framework paper (CIT '10).
@inproceedings{sblock,
  author    = {Brandvik, Tobias and Pullan, Graham},
  title     = {{SBLOCK}: A Framework for Efficient Stencil-Based {PDE} Solvers on Multi-core Platforms},
  booktitle = {Proceedings of the 2010 10th IEEE International Conference on Computer and Information Technology},
  series    = {CIT '10},
  pages     = {1181--1188},
  numpages  = {8},
  year      = {2010},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  isbn      = {978-0-7695-4108-2}
}

% Discrete adjoint methods article, AIAA Journal 41(2), 2003.
% Initials are space-separated so BibTeX parses each one as its own
% given-name token; the umlaut uses the {\"u} special-character form.
@article{Hydra,
  author  = {Giles, M. B. and Duta, M. C. and M{\"u}ller, J.-D. and Pierce, N. A.},
  title   = {Algorithm developments for discrete adjoint methods},
  journal = {AIAA Journal},
  volume  = {41},
  number  = {2},
  pages   = {198--205},
  year    = {2003}
}

% Run-time data/iteration reordering composition paper (PLDI 2003).
% `month` uses the predefined macro so styles can localise or abbreviate it.
% The publisher city is in `address`, paired with `publisher`, as in the
% other ACM entries of this file.
% NOTE(review): publisher taken from the "ACM SIGPLAN" booktitle -- confirm.
@inproceedings{inspect-execute,
  author    = {Strout, Michelle Mills and Carter, Larry and Ferrante, Jeanne},
  title     = {Compile-time Composition of Run-time Data and Iteration Reorderings},
  booktitle = {Proceedings of the 2003 {ACM} {SIGPLAN} Conference on Programming Language Design and Implementation (PLDI)},
  pages     = {91--102},
  month     = jun,
  year      = {2003},
  publisher = {ACM},
  address   = {New York, NY, USA}
}

% Physis stencil programming model paper (SC '11).
@inproceedings{stencil-gpu-1,
  author    = {Maruyama, Naoya and Nomura, Tatsuo and Sato, Kento and Matsuoka, Satoshi},
  title     = {Physis: an implicitly parallel programming model for stencil computations on large-scale {GPU}-accelerated supercomputers},
  booktitle = {Proceedings of 2011 International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '11},
  location  = {Seattle, Washington},
  pages     = {11:1--11:12},
  articleno = {11},
  numpages  = {12},
  year      = {2011},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-0771-0},
  doi       = {10.1145/2063384.2063398},
  url       = {http://doi.acm.org/10.1145/2063384.2063398},
  acmid     = {2063398},
  keywords  = {application framework, domain specific languages, high performance computing}
}

% DGEMM on Fermi GPU paper (SC '11).
@inproceedings{matrixmul-gpu-sc11,
  author    = {Tan, Guangming and Li, Linchuan and Triechle, Sean and Phillips, Everett and Bao, Yungang and Sun, Ninghui},
  title     = {Fast implementation of {DGEMM} on {Fermi} {GPU}},
  booktitle = {Proceedings of 2011 International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '11},
  location  = {Seattle, Washington},
  pages     = {35:1--35:11},
  articleno = {35},
  numpages  = {11},
  year      = {2011},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-0771-0},
  doi       = {10.1145/2063384.2063431},
  url       = {http://doi.acm.org/10.1145/2063384.2063431},
  acmid     = {2063431},
  keywords  = {CUDA, GPU, high performance computing, matrix-matrix multiplication}
}

% Web reference for OpenMP; `key` supplies the sort/label text because the
% entry has no author.
@misc{OpenMP,
  key          = {openmp},
  title        = {{OpenMP} forum},
  howpublished = {website},
  note         = {http://openmp.org/wp/}
}

% Web reference for HYDRA at Rolls Royce.
% `key` supplies the sort/label text because the entry has no author; the
% value was previously in the ignored `OPTkey` field.
% Only the acronym and company name are braced, not the whole title.
@misc{hydra-website,
  key   = {hydra},
  title = {{HYDRA} website at {Rolls Royce Plc.}},
  note  = {http://www.rolls-royce.com/technology\_innovation/systems\_tech/design\_systems\_tools.jsp}
}

% Multilevel graph partitioning article (SIAM J. Sci. Comput. 20(1)).
@article{metis,
  author     = {Karypis, George and Kumar, Vipin},
  title      = {A Fast and High Quality Multilevel Scheme for Partitioning Irregular Graphs},
  journal    = {SIAM J. Sci. Comput.},
  volume     = {20},
  number     = {1},
  pages      = {359--392},
  numpages   = {34},
  month      = dec,
  year       = {1998},
  issue_date = {Aug. 1998},
  publisher  = {Society for Industrial and Applied Mathematics},
  address    = {Philadelphia, PA, USA},
  issn       = {1064-8275},
  acmid      = {305248},
  keywords   = {fill-reducing orderings, finite element computations, graph partitioning, parallel computations}
}

% NASA report TP-1337 (1978).
% The report identifier is in `number` so styles print it beside the report
% type rather than as a trailing note.
@techreport{nasarotor37-1,
  author      = {Reid, L. and Moore, D.},
  title       = {Design and overall performance of four highly loaded, high-speed inlet stages for an advanced high-pressure-ratio core compressor},
  institution = {NASA},
  number      = {TP-1337},
  year        = {1978}
}



% AGARD working group study of 3D Navier-Stokes codes (1998).
% NOTE(review): `journal = {ASME}` looks like a publisher rather than a
% journal, and no volume/number/pages are recorded -- confirm the actual
% venue and fill in the missing details.
@article{nasarotor37-2,
  author  = {Dunham, J. and Meauz{\'e}, G.},
  title   = {An {AGARD} working group study of {3D} {Navier}-{Stokes} codes applied to single turbomachinery blade rows},
  journal = {ASME},
  year    = {1998}
}

% Active Libraries workshop paper (OO'98).
% The booktitle has no leading "In" because bibliography styles add it; the
% workshop acronym uses an ASCII apostrophe and a closed parenthesis.
@inproceedings{activelibrary,
  author    = {Veldhuizen, Todd L. and Gannon, Dennis},
  title     = {Active Libraries: Rethinking the roles of compilers and libraries},
  booktitle = {Proceedings of the {SIAM} Workshop on Object Oriented Methods for Inter-operable Scientific and Engineering Computing ({OO}'98)},
  year      = {1998},
  publisher = {SIAM Press}
}


% NVIDIA GeForce GTX 680 whitepaper (2012), cited by URL.
@misc{kepler,
  title = {Whitepaper - {NVIDIA} {GeForce} {GTX} 680},
  note  = {http://www.geforce.com/Active/en\_US/en\_US/pdf/GeForce-GTX-680-Whitepaper-FINAL.pdf},
  year  = {2012}
}


% CUDA C Programming Guide, cited by URL.
% The URL is on a single line, and the entry has its closing brace so the
% following entry is not swallowed by the parser.
@manual{cuda-C,
  title = {CUDA C Programming Guide},
  note  = {\url{http://developer.download.nvidia.com/compute/DevZone/docs/html/C/doc/CUDA_C_Programming_Guide.pdf}}
}

% CUDA Fortran programming guide, cited by URL.
@manual{cuda-FORTRAN,
  title = {CUDA Fortran - Programming Guide and Reference},
  note  = {http://www.pgroup.com/doc/pgicudafortug.pdf}
}


% Distributed data-parallel analysis/visualization framework paper (GPGPU-5).
@inproceedings{jerome,
  author    = {Meredith, Jeremy S. and Sisneros, Robert and Pugmire, David and Ahern, Sean},
  title     = {A distributed data-parallel framework for analysis and visualization algorithm development},
  booktitle = {Proceedings of the 5th Annual Workshop on General Purpose Processing with Graphics Processing Units},
  series    = {GPGPU-5},
  location  = {London, England},
  pages     = {11--19},
  numpages  = {9},
  year      = {2012},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-1233-2},
  doi       = {10.1145/2159430.2159432},
  url       = {http://doi.acm.org/10.1145/2159430.2159432},
  acmid     = {2159432},
  keywords  = {GPGPU, analysis, visualization}
}

% Shared-memory thread-pool paper for hybrid parallel CFD solvers (Euro-Par'11).
% Accents use the {\"a} special-character form so BibTeX sorts and labels the
% surname correctly; the acronym CFD is braced against sentence-casing.
@inproceedings{tau,
  author    = {J{\"a}gersk{\"u}pper, Jens and Simmendinger, Christian},
  title     = {A novel shared-memory thread-pool implementation for hybrid parallel {CFD} solvers},
  booktitle = {Proceedings of the 17th international conference on Parallel processing - Volume Part II},
  series    = {Euro-Par'11},
  location  = {Bordeaux, France},
  pages     = {182--193},
  numpages  = {12},
  year      = {2011},
  publisher = {Springer-Verlag},
  address   = {Berlin, Heidelberg},
  isbn      = {978-3-642-23396-8},
  url       = {http://dl.acm.org/citation.cfm?id=2033408.2033429},
  acmid     = {2033429}
}